% Encoding: UTF-8

% Dropout paper: JMLR volume 15, paper no. 56, cumulative pages 1929--1958.
@Article{srivastava2014dropout,
  author    = {Srivastava, Nitish and Hinton, Geoffrey and Krizhevsky, Alex and Sutskever, Ilya and Salakhutdinov, Ruslan},
  journal   = {Journal of Machine Learning Research},
  title     = {Dropout: A Simple Way to Prevent Neural Networks from Overfitting},
  year      = {2014},
  number    = {56},
  pages     = {1929--1958},
  volume    = {15},
  publisher = {JMLR.org},
}

% ResNet (CVPR 2016). The booktitle is stored in full title case because
% standard styles print it verbatim; the acronym is brace-protected.
@InProceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  booktitle = {Proceedings of the {IEEE} Conference on Computer Vision and Pattern Recognition},
  title     = {Deep Residual Learning for Image Recognition},
  year      = {2016},
  pages     = {770--778},
}

% VGG preprint. The arXiv identifier lives in the eprint fields rather than
% in a fake journal name; the url keeps it visible under styles that do not
% understand eprint.
@Misc{simonyan2014very,
  author        = {Simonyan, Karen and Zisserman, Andrew},
  title         = {Very Deep Convolutional Networks for Large-Scale Image Recognition},
  year          = {2014},
  archiveprefix = {arXiv},
  eprint        = {1409.1556},
  primaryclass  = {cs.CV},
  url           = {https://arxiv.org/abs/1409.1556},
}

% GoogLeNet / Inception (CVPR 2015). The booktitle is stored in full title
% case because standard styles print it verbatim.
@InProceedings{szegedy2015going,
  author    = {Szegedy, Christian and Liu, Wei and Jia, Yangqing and Sermanet, Pierre and Reed, Scott and Anguelov, Dragomir and Erhan, Dumitru and Vanhoucke, Vincent and Rabinovich, Andrew},
  booktitle = {Proceedings of the {IEEE} Conference on Computer Vision and Pattern Recognition},
  title     = {Going Deeper with Convolutions},
  year      = {2015},
  pages     = {1--9},
}

% Transformer paper (NeurIPS 2017, volume 30 of the proceedings series).
% The L-with-stroke is written as a braced special character so the given
% name stays a single token for name parsing, sorting and abbreviation.
@InProceedings{Vaswani2017,
  author    = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N. and Kaiser, {\L}ukasz and Polosukhin, Illia},
  booktitle = {Advances in Neural Information Processing Systems},
  title     = {Attention Is All You Need},
  year      = {2017},
  publisher = {Curran Associates, Inc.},
  volume    = {30},
}

% BERT (NAACL-HLT 2019). Acronyms are brace-protected so sentence-casing
% styles do not lower-case them.
@InProceedings{Devlin2019,
  author    = {Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina},
  booktitle = {Proceedings of {NAACL-HLT}},
  title     = {{BERT}: Pre-training of Deep Bidirectional Transformers for Language Understanding},
  year      = {2019},
  pages     = {4171--4186},
}

% word2vec preprint. The arXiv identifier lives in the eprint fields rather
% than in a fake journal name; the url keeps it visible under styles that do
% not understand eprint.
@Misc{mikolov2013efficient,
  author        = {Mikolov, Tomas and Chen, Kai and Corrado, Greg and Dean, Jeffrey},
  title         = {Efficient Estimation of Word Representations in Vector Space},
  year          = {2013},
  archiveprefix = {arXiv},
  eprint        = {1301.3781},
  primaryclass  = {cs.CL},
  url           = {https://arxiv.org/abs/1301.3781},
}

% FGSM / adversarial examples preprint. The arXiv identifier lives in the
% eprint fields rather than in a fake journal name; the url keeps it visible
% under styles that do not understand eprint.
@Misc{goodfellow2014explaining,
  author        = {Goodfellow, Ian J. and Shlens, Jonathon and Szegedy, Christian},
  title         = {Explaining and Harnessing Adversarial Examples},
  year          = {2014},
  archiveprefix = {arXiv},
  eprint        = {1412.6572},
  primaryclass  = {stat.ML},
  url           = {https://arxiv.org/abs/1412.6572},
}

% Lottery Ticket Hypothesis. The year matches the cited venue (ICLR 2019);
% the arXiv preprint is from 2018, which is why the citation key says 2018.
% The key is kept as-is so existing citations keep resolving.
@InProceedings{frankle2018lottery,
  author    = {Frankle, Jonathan and Carbin, Michael},
  booktitle = {International Conference on Learning Representations ({ICLR})},
  title     = {The Lottery Ticket Hypothesis: Finding Sparse, Trainable Neural Networks},
  year      = {2019},
}

% Knowledge distillation (workshop paper, available on arXiv).
% Author names use the unambiguous "Last, First" form like the rest of the file.
@InProceedings{Hinton2015,
  author    = {Hinton, Geoffrey and Vinyals, Oriol and Dean, Jeffrey},
  booktitle = {{NIPS} Deep Learning and Representation Learning Workshop},
  title     = {Distilling the Knowledge in a Neural Network},
  year      = {2015},
  url       = {https://arxiv.org/abs/1503.02531},
}

% Xception (CVPR 2017). The coined architecture name and the acronym are
% brace-protected; the booktitle is stored in full title case because
% standard styles print it verbatim.
@InProceedings{chollet2017xception,
  author    = {Chollet, Fran{\c{c}}ois},
  booktitle = {Proceedings of the {IEEE} Conference on Computer Vision and Pattern Recognition},
  title     = {{Xception}: Deep Learning with Depthwise Separable Convolutions},
  year      = {2017},
  pages     = {1251--1258},
}

% Deep visualization workshop paper (ICML Deep Learning Workshop, 2015).
% The booktitle must not start with "In": bibliography styles add that word
% themselves. The citation key has no year and is kept as-is so existing
% citations keep resolving.
@InProceedings{yosinskiunderstanding,
  author    = {Yosinski, Jason and Clune, Jeff and Nguyen, Anh and Fuchs, Thomas and Lipson, Hod},
  booktitle = {{ICML} Workshop on Deep Learning},
  title     = {Understanding Neural Networks Through Deep Visualization},
  year      = {2015},
}

% ZFNet visualization paper (ECCV 2014). Springer is the proceedings
% publisher, so it belongs in the publisher field, not organization.
@InProceedings{zeiler2014visualizing,
  author    = {Zeiler, Matthew D. and Fergus, Rob},
  booktitle = {European Conference on Computer Vision},
  title     = {Visualizing and Understanding Convolutional Networks},
  year      = {2014},
  pages     = {818--833},
  publisher = {Springer},
}

% DANN paper: JMLR volume 17, paper no. 59. JMLR paginates each paper
% separately from volume 17 on, so the page range is 1--35.
@Article{ganin2016domain,
  author    = {Ganin, Yaroslav and Ustinova, Evgeniya and Ajakan, Hana and Germain, Pascal and Larochelle, Hugo and Laviolette, Fran{\c{c}}ois and Marchand, Mario and Lempitsky, Victor},
  journal   = {Journal of Machine Learning Research},
  title     = {Domain-Adversarial Training of Neural Networks},
  year      = {2016},
  number    = {59},
  pages     = {1--35},
  volume    = {17},
  publisher = {JMLR.org},
}

@Comment{jabref-meta: databaseType:bibtex;}
